package edu.ptit.jad.configuration;

/**
 * String constants used by the topic model algorithm
 * 
 * @author PhuongDo
 * 
 */
public final class CONSTANTS {

	/**
	 * Not instantiable: this class only exposes static constants.
	 */
	private CONSTANTS() {
		// no instances
	}

	/*
	 * Regular expressions
	 */

	/**
	 * Matches any single character that is not an ASCII letter or digit. Note
	 * that this is broader than punctuation: whitespace and non-ASCII letters
	 * match as well.
	 */
	public static final String PUNCTUATION_REGEX = "[^a-zA-Z0-9]";

	/**
	 * Matches the shortest span that starts with {@code <} and ends with
	 * {@code >} (reluctant quantifier). Despite the name, the delimiters are
	 * angle brackets, not braces.
	 */
	public static final String REGEX_BRACES = "<.+?>";

	/**
	 * Matches one or more digits followed by zero or more characters that are
	 * not ASCII letters or digits (so trailing separators are consumed too).
	 */
	public static final String REGEX_NUMBERS = "\\d+[^a-zA-Z0-9]*";

	/** Matches a run of one or more whitespace characters. */
	public static final String REGEX_SPACE = "\\s+";

	/**
	 * Matches a run of one or two word characters ({@code \w}) delimited by
	 * word boundaries.
	 */
	public static final String REGEX_SHORT_WORDS = "\\b[\\w]{1,2}\\b";

	/** Matches a single literal backslash. */
	public static final String REGEX_BACKSLASH = "\\\\";

	/** Matches a single forward slash. */
	public static final String REGEX_FORWARDSLASH = "/";

	/*
	 * Other constants
	 */

	/** A single space character as a string. */
	public static final String CHAR_SPACE = " ";

	/** The {@code file://} URI prefix. */
	public static final String URI_FILE_STRING = "file://";

	/** The empty string. */
	public static final String STRING_EMPTY = "";

	/*
	 * File constants
	 *
	 * All paths below are relative path strings; what they are resolved
	 * against is decided by the code that opens them (presumably the working
	 * directory -- confirm against callers).
	 */

	public static final String FILE_DATA_TOK_ADS = "data/trains/ads.tok.jad";
	public static final String FILE_DATA_TOK_NEWS = "data/trains/news.tok.jad";

	public static final String FILE_DATA_ADS = "data/trains/ads.jad";
	public static final String FILE_DATA_NEWS = "data/trains/news.jad";
	public static final String FILE_DATA_CATES = "data/trains/cats.jad";

	public static final String FILE_DATA_NEWS_PRE = "data/preprocess/news.pre.jad";
	public static final String FILE_DATA_NEWS_TD_PRE = "data/preprocess/news_td.pre.jad";
	public static final String FILE_DATA_ADS_PRE = "data/preprocess/ads.pre.jad";

	/*
	 * File input
	 */

	public static final String FILE_AD_MATRIX = "data/input/ad_matrix.jad";

	/*
	 * File output
	 */

	public static final String FILE_OUT_TFIDF_SIMI = "data/output/tf_idf.simi.jad";
	public static final String FILE_OUT_TFIDF_TD_SIMI = "data/output/tf_idf_td.simi.jad";
	public static final String FILE_OUT_LDA_SIMI = "data/output/lda.simi.jad";
	public static final String FILE_OUT_AT_SIMI = "data/output/at.simi.jad";

	/*
	 * File Configurations
	 */

	public static final String FILE_CONFIG = "conf/app.properties";

	public static final String FILE_STOPWORDS = "data/dict/stopwords.jad";
	public static final String FILE_SYNONYMS = "data/dict/synonyms.jad";
	public static final String FILE_VOBS = "data/dict/vn_vobs.jad";

	/**
	 * No-op entry point, kept so the class remains runnable as before.
	 *
	 * @param args
	 *            ignored
	 */
	public static void main(String[] args) {
		// Intentionally empty. To try a pattern by hand, e.g.:
		// "121 2131 omkar asda 41234 1valid1".replaceAll(REGEX_NUMBERS, "_")
	}
}
